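'''
Read the "test.txt" file from the materials, segment it into words with the
jieba library, and write the five most frequent words together with their
occurrence counts to the "output.txt" file.
'''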
import jieba
# Tokens that must never be counted (whitespace).
exclude = {' '}
# Number of most frequent words to report.
TOP_N = 5

# Read the whole input text; the context manager closes the handle even
# if reading fails part-way.
with open('test.txt', 'r', encoding='UTF-8') as src:
    txt = src.read()

# Segment the text into a list of tokens.
words = jieba.lcut(txt)

# Count every token, skipping single-character tokens (punctuation,
# whitespace, one-character words) and anything listed in `exclude`.
counts = {}
for word in words:
    if len(word) == 1 or word in exclude:
        continue
    counts[word] = counts.get(word, 0) + 1

# Sort by count, highest first. The sort is stable, so words with equal
# counts keep the order in which they first appeared in the text.
items = sorted(counts.items(), key=lambda x: x[1], reverse=True)

# Write one "word:count" line per entry. Slicing (rather than indexing
# 0..4) avoids an IndexError when fewer than TOP_N distinct words exist.
# The encoding is given explicitly so the output does not depend on the
# platform's default locale encoding.
with open('output.txt', 'w', encoding='UTF-8') as txt2:
    for word, count in items[:TOP_N]:
        txt2.write('{}:{}\n'.format(word, count))
